"""
创建语料
"""


from prepar_corpus import process, process_by_word, process_xiaohuangji
from prepar_corpus.prepar_recall_corpus.recall_corpus import process_recall_corpus
from prepar_corpus.prepar_sort_corpus.sort_corpus import process_sort_corpus


def _main():
    """Run the currently enabled corpus-preparation step.

    The other steps are kept as commented-out calls; uncomment whichever
    one needs to be run.
    """
    # process()
    # process_by_word()
    # process_xiaohuangji(by_word=True)
    # process_recall_corpus()
    # Original note on the no-argument call below: splitting by word is too
    # slow, so from now on only the data split into single characters is used.
    # process_sort_corpus()
    # NOTE(review): the active call passes by_word=True -- confirm that this
    # is consistent with the note above.
    process_sort_corpus(by_word=True)


if __name__ == "__main__":
    _main()
